import requests
from bs4 import BeautifulSoup
import  csv
def get_html(url):
    head = {"User-Agent":"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36"}
    try:
        r = requests.get(url=url, headers=head)
        r.encoding = r.apparent_encoding
        r.raise_for_status()
        return r.text
    except Exception as e:
        print(e)

def parser(html):
    soup = BeautifulSoup(html,'lxml')
    out_list = []

    for row in soup.select('#pane-news ul>li'):
        row_data = [
            row.select('a')[0].text,
            row.select('a')[0].attrs['href']
        ]
        out_list.append(row_data)
    return out_list

def save_csv(path,shuju):
    with open(path,'w+',encoding='utf-8',newline='')as f:
        csv_write = csv.writer(f)
        csv_write.writerows(shuju)
if __name__ == '__main__':
    url = 'https://news.baidu.com/'
    html = get_html(url)
    out_list =parser(html)
    path = 'd:\\news.csv'
    save_csv(path,out_list)